PC World 2007 June

home *** CD-ROM | disk | FTP | other *** search

/ PC World 2007 June / PCWorld_2007-06_cd.bin / temacd / wikipad / WikidPad-1.9beta2.exe / {app} / extensions / WikiSyntax.py < prev

Wrap

Text File | 2007-02-24 | 11KB | 260 lines

import locale import string import pwiki.srePersistent as re from pwiki.StringOps import mbcsDec locale.setlocale(locale.LC_ALL, '') # String containing the delimiter between the title of a wiki word (to show in # HTML and the real word, as e.g. [title | WikiWord] TitleWikiWordDelimiter = ur"|" # Same, escaped for regular expression TitleWikiWordDelimiterPAT = ur"\|" PlainCharacterPAT = ur"(?:[^\\]|\\.)" PlainEscapedCharacterRE = re.compile(ur"\\(.)", re.DOTALL | re.UNICODE | re.MULTILINE) # PlainCharactersRE = re.compile(PlainCharacterPAT + "+", # re.DOTALL | re.UNICODE | re.MULTILINE) # basic formatting BoldRE = re.compile(ur"\*(?=\S)(?P<boldContent>" + PlainCharacterPAT + ur"+?)\*", re.DOTALL | re.UNICODE | re.MULTILINE) ItalicRE = re.compile(ur"\b_(?P<italicContent>" + PlainCharacterPAT + ur"+?)_\b", re.DOTALL | re.UNICODE | re.MULTILINE) HtmlTagRE = re.compile( ur"</?[A-Za-z][A-Za-z0-9]*(?:/| [^\n>]*)?>", re.DOTALL | re.UNICODE | re.MULTILINE) Heading4RE = re.compile(u"^\\+\\+\\+\\+(?!\\+) ?(?P<h4Content>" + PlainCharacterPAT + ur"+?)\n", re.DOTALL | re.UNICODE | re.MULTILINE) Heading3RE = re.compile(u"^\\+\\+\\+(?!\\+) ?(?P<h3Content>" + PlainCharacterPAT + ur"+?)\n", re.DOTALL | re.UNICODE | re.MULTILINE) Heading2RE = re.compile(u"^\\+\\+(?!\\+) ?(?P<h2Content>" + PlainCharacterPAT + ur"+?)\n", re.DOTALL | re.UNICODE | re.MULTILINE) Heading1RE = re.compile(u"^\\+(?!\\+) ?(?P<h1Content>" + PlainCharacterPAT + ur"+?)\n", re.DOTALL | re.UNICODE | re.MULTILINE) # UrlRE = re.compile(ur'(?:(?:wiki|file|https?|ftp|rel)://|mailto:)[^"\s<>]*', # re.DOTALL | re.UNICODE | re.MULTILINE) # SPN UrlRE = re.compile(ur'(?:(?:wiki|file|https?|ftp|rel)://|mailto:)' ur'(?:(?![.,;:!?)]+["\s])[^"\s<>])*(?:>\S+)?', re.DOTALL | re.UNICODE | re.MULTILINE) # SPN TitledUrlRE = re.compile( ur"\[(?P<titledurlUrl>" + UrlRE.pattern + ur")" ur"(?:(?P<titledurlDelim>[ \t]*" + TitleWikiWordDelimiterPAT + ur")" ur"(?P<titledurlTitle>" + PlainCharacterPAT + ur"+?))?\]", re.DOTALL | re.UNICODE | re.MULTILINE) # The following 2 are not in WikiFormatting.FormatExpressions BulletRE = re.compile(ur"^(?P<indentBullet>[ \t]*)(?P<actualBullet>\*[ \t])", re.DOTALL | re.UNICODE | re.MULTILINE) # SPN NumericBulletRE = re.compile(ur"^(?P<indentNumeric>[ \t]*)(?P<preLastNumeric>(?:\d+\.)*)(\d+)\.[ \t]", re.DOTALL | re.UNICODE | re.MULTILINE) # SPN # WikiWords #WikiWordRE = re.compile(r"\b(?<!~)(?:[A-Z\xc0-\xde\x8a-\x8f]+[a-z\xdf-\xff\x9a-\x9f]+[A-Z\xc0-\xde\x8a-\x8f]+[a-zA-Z0-9\xc0-\xde\x8a-\x8f\xdf-\xff\x9a-\x9f]*|[A-Z\xc0-\xde\x8a-\x8f]{2,}[a-z\xdf-\xff\x9a-\x9f]+)\b") #WikiWordRE2 = re.compile("\[[a-zA-Z0-9\-\_\s]+?\]") # TODO To unicode UPPERCASE = mbcsDec(string.uppercase)[0] LOWERCASE = mbcsDec(string.lowercase)[0] LETTERS = UPPERCASE + LOWERCASE # # Pattern string for delimiter for search fragment after wiki word # WikiWordSearchFragDelimPAT = ur"#" # # # Pattern string for search fragment itself # WikiWordSearchFragPAT = ur"(?:#.|[^ \t\n#])+" singleWikiWord = (ur"(?:[" + UPPERCASE + # "A-Z\xc0-\xde\x8a-\x8f" ur"]+[" + LOWERCASE + # "a-z\xdf-\xff\x9a-\x9f" ur"]+[" + UPPERCASE + # "A-Z\xc0-\xde\x8a-\x8f" ur"]+[" + LETTERS + string.digits + # "a-zA-Z0-9\xc0-\xde\x8a-\x8f\xdf-\xff\x9a-\x9f" ur"]*|[" + UPPERCASE + # "A-Z\xc0-\xde\x8a-\x8f" ur"]{2,}[" + LOWERCASE + # "a-z\xdf-\xff\x9a-\x9f" ur"]+)") WikiWordRE = re.compile(ur"\b(?<!~)" + singleWikiWord + ur"\b", # ur"(?:/" + singleWikiWord + # ur")*\b", re.DOTALL | re.UNICODE | re.MULTILINE) AnchorStart = ur"!" AnchorStartPAT = ur"!" # Special version for syntax highlighting to allow appending search expression with '#' WikiWordEditorRE = re.compile(ur"(?P<wikiword>" + WikiWordRE.pattern + ur")(?:#(?P<wikiwordSearchfrag>(?:(?:#.)|[^ \t\n#])+)|" + AnchorStartPAT + ur"(?P<wikiwordAnchorfrag>[A-Za-z0-9\_]+))?", re.DOTALL | re.UNICODE | re.MULTILINE) # Only to exclude them from WikiWordRE2 FootnoteRE = re.compile(ur"\[[0-9]+?\]", re.DOTALL | re.UNICODE | re.MULTILINE) # Pattern string for non camelcase wiki word WikiWordNccPAT = ur"[\w\-\_ \t]+?" WikiWordRE2 = re.compile(ur"\[(?:" + WikiWordNccPAT + ur")\]", re.DOTALL | re.UNICODE | re.MULTILINE) # Special version for syntax highlighting to allow appending search expression with '#' # WikiWordEditorRE2 = re.compile( # ur"\[(?P<wikiwordnccTitle>[^\]\|]+" + TitleWikiWordDelimiterPAT + ur"\s*)?" # ur"(?P<wikiwordncc>" + WikiWordNccPAT + ur")\]" # ur"(?:#(?P<wikiwordnccSearchfrag>(?:(?:#.)|[^ \t\n#])+))?", # re.DOTALL | re.UNICODE | re.MULTILINE) WikiWordEditorRE2 = re.compile( ur"\[(?P<wikiwordncc>" + WikiWordNccPAT + ur")" ur"(?:(?P<wikiwordnccDelim>[ \t]*" + TitleWikiWordDelimiterPAT + ur")" ur"(?P<wikiwordnccTitle>" + PlainCharacterPAT + ur"+?))?\]" ur"(?:#(?P<wikiwordnccSearchfrag>(?:(?:#.)|[^ \t\n#])+)|" + AnchorStartPAT + ur"(?P<wikiwordnccAnchorfrag>[A-Za-z0-9\_]+))?", re.DOTALL | re.UNICODE | re.MULTILINE) SearchFragmentUnescapeRE = re.compile(ur"#(.)", re.DOTALL | re.UNICODE | re.MULTILINE) # For spell checking TextWordRE = re.compile(ur"(?P<negative>[0-9]+|"+ UrlRE.pattern + u"|" + WikiWordRE.pattern + ur")|\b[\w']+", re.DOTALL | re.UNICODE | re.MULTILINE) # SP only # parses the dynamic properties PropertyRE = re.compile(ur"\[[ \t]*(?P<propertyName>[\w\-\_\.]+?)[ \t]*" + ur"[=:][ \t]*(?P<propertyValue>[\w\-\_ \t:;,.!?#/|]+?)\]", re.DOTALL | re.UNICODE | re.MULTILINE) # InsertionRE = re.compile(ur"\[:[ \t]*(?P<insertionKey>[\w\-\_\.]+?)[ \t]*" + # ur"[:][ \t]*(?P<insertionValue>[\w\-\_ \t;,.!?#/|]+?)\]", # re.DOTALL | re.UNICODE | re.MULTILINE) InsertionValueRE = re.compile(ur"(?:(?P<insertionValue>[\w][\w\-\_ \t,.!?#/|]*)|" ur"(?P<insertionQuoteStarter>\"+|'+|/+|\\+)" ur"(?P<insertionQuotedValue>.*?)(?P=insertionQuoteStarter))", re.DOTALL | re.UNICODE | re.MULTILINE) InsertionAppendixRE = re.compile(ur";[ \t]*(?:" ur"(?P<insertionAppendix>[\w][\w\-\_ \t,.!?#/|]*)|" ur"(?P<insertionApxQuoteStarter>\"+|'+|/+|\\+)" ur"(?P<insertionQuotedAppendix>.*?)(?P=insertionApxQuoteStarter))", re.DOTALL | re.UNICODE | re.MULTILINE) InsertionRE = re.compile(ur"\[:[ \t]*(?P<insertionKey>[\w][\w\-\_\.]*)[ \t]*" + ur":[ \t]*(?P<insertionContent>" + InsertionValueRE.pattern + ur"(?:" + InsertionAppendixRE.pattern + ur")*)\]", re.DOTALL | re.UNICODE | re.MULTILINE) # Reverse REs for autocompletion revSingleWikiWord = (ur"(?:[" + LETTERS + string.digits + ur"]*[" + UPPERCASE+ ur"])") RevWikiWordRE = re.compile(ur"^" + # revSingleWikiWord + ur"(?:/" + revSingleWikiWord + ur"(?![\~])\b", re.DOTALL | re.UNICODE | re.MULTILINE) # SPN RevWikiWordRE2 = re.compile(ur"^[\w\-\_ \t.]+?\[", re.DOTALL | re.UNICODE | re.MULTILINE) # SPN RevPropertyValue = re.compile(ur"^([\w\-\_ \t:;,.!?#/|]*?)([ \t]*[=:][ \t]*)([\w\-\_ \t\.]+?)\[", re.DOTALL | re.UNICODE | re.MULTILINE) # SPN # script blocks ScriptRE = re.compile(u"\<%(.*?)%\>", re.DOTALL) # Auto generated area AutoGenAreaRE = re.compile(ur"^([ \t]*<<[ \t]+)([^\n]+\n)(.*?)^([ \t]*>>[ \t]*\n)", re.DOTALL | re.LOCALE | re.MULTILINE) # todos, captures the todo item text ## ToDoREWithContent = re.compile(u"^\s*((?:todo|action|track|issue|question|project)\\.?[^\\:\\s]*:[^\\r\\n]+)", re.MULTILINE) ToDoREWithContent = re.compile(ur"\b(?P<todoIndent>)" # ur"(?P<todoIndent>^[ \t]*)" ur"(?P<todoName>(?:todo|done|wait|action|track|issue|question|project)(?:\.[^:\s]+)?)" ur"(?P<todoDelimiter>:)(?P<todoValue>" + PlainCharacterPAT + ur"+?)(?:$|(?=\|))", re.DOTALL | re.UNICODE | re.MULTILINE) # todos, used in the tree control to parse saved todos. Because they were # already identified as todos, the regexp can be quite simple ToDoREWithCapturing = re.compile(ur"^([^:\s]+):[ \t]*(.+?)$", re.DOTALL | re.UNICODE | re.MULTILINE) # used to detect indent levels # The following 2 are not in WikiFormatting.FormatExpressions EmptyLineRE = re.compile(ur"^[ \t\r\n]*$", re.DOTALL | re.UNICODE | re.MULTILINE) HorizLineRE = re.compile(u"----+", re.DOTALL | re.UNICODE | re.MULTILINE) # suppression expression # Orig: SuppressHighlightingRE = re.compile("\<\<(.*?)\>\>", re.DOTALL) SuppressHighlightingRE = re.compile(ur"^(?P<suppressIndent>[ \t]*)<<[ \t]*\n"+ ur"(?P<suppressContent>.*?)\n[ \t]*>>[ \t]*$", re.DOTALL | re.UNICODE | re.MULTILINE) AnchorRE = re.compile(ur"^[ \t]*anchor:[ \t]*(?P<anchorValue>[A-Za-z0-9\_]+)\n", re.DOTALL | re.UNICODE | re.MULTILINE) TableRowDelimiterPAT = ur"\n" TableRE = re.compile(ur"(?P<tableBegin>^[ \t]*<<\|[ \t]*$)" ur"(?P<tableContent>" + PlainCharacterPAT + ur"*?)(?P<tableEnd>^[ \t]*>>[ \t]*$)", re.DOTALL | re.UNICODE | re.MULTILINE) PreBlockRE = re.compile(ur"(?P<preBegin>^[ \t]*<<pre[ \t]*\n)" ur"(?P<preContent>." # + PlainCharacterPAT + ur"*?)(?P<preEnd>\n[ \t]*>>[ \t]*$(\n)?)", re.DOTALL | re.UNICODE | re.MULTILINE)